class TimeEfficientInventory():
    #____________________________________________
    # Laptop inventory read from a CSV file and pre-indexed so that the
    # queries below avoid re-scanning or re-sorting the data.
    #
    # The first column of every row is used as the laptop id and the
    # last column as its price.
    #____________________________________________
    #initializes attributes: 
    # self.header         first CSV row (column names); [] for an empty file
    # self.rows           data rows, with the price column converted to int
    # self.id_to_row      dictionary: laptop id -> row
    # self.prices         set of all distinct prices
    # self.rows_by_price  the rows sorted by ascending price
    def __init__(self,csv_filename):
        #read file; the csv module asks for newline = '' so that newlines
        #embedded inside quoted fields are parsed correctly
        with open(csv_filename, encoding = 'utf8', newline = '') as file:
            data = list(csv.reader(file))
        #_____________
        #assign self.header (an empty file has no header row)
        self.header = data[0] if data else []
        #___________
        #assign self.rows; csv.reader yields [] for blank lines, and
        #those have no price column to convert, so they are skipped
        rows = [row for row in data[1:] if row]
        self.rows = rows
        #_______________________________
        #convert price column to integer
        for row in rows:                                    #O(N)
            row[-1] = int(row[-1])                              #O(1)    
        #______________________           
        # assign self.id_to_row (a repeated id keeps the last row seen)
        self.id_to_row = {row[0]: row for row in rows}      #O(N)
        #__________________________________________
        # assign self.prices, the set of all prices
        self.prices = {row[-1] for row in rows}             #O(N)
        #_________________________________________
        # assign self.rows_by_price, 
        # a sorted version of rows (self.rows keeps the file order)
        self.rows_by_price = sorted(rows, key = lambda row: row[-1])    #O(N log N)
        
    #______________________________________
    #______________________________________
    #given laptop_id, returns corresponding
    #row using dictionary self.id_to_row,
    #or None when the id is unknown
    def get_laptop_from_id_fast(self, laptop_id):
        return self.id_to_row.get(laptop_id)                #O(1) lookup time, since dictionary uses hash table
    
    #______________________________________
    #______________________________________
    #given dollars, returns True if exactly (dollars) can be spent
    #on one laptop or on two laptops (the same row may be counted
    #twice), False otherwise
    #uses the set of all prices self.prices
    def check_promotion_dollars_fast(self, dollars):
        if dollars in self.prices:                          #O(1)
            return True
        for row in self.rows:                               #O(N)
            #is there a price that complements this row's price?
            if (dollars - row[-1]) in self.prices:              #O(1)
                return True  
        return False
    
    #_________________________________
    # uses self.rows_by_price to find first laptop outside
    # budget range in O(log N) time using a binary search
    # returns the index (into self.rows_by_price) of the first row whose
    # price is strictly greater than target_price, or -1 when there is
    # no such row (every laptop is affordable, or the inventory is empty)
    def find_first_laptop_more_expensive(self, target_price):
        #search the half-open index range [lower_bound, upper_bound);
        #upper_bound == len(...) stands for "no laptop is more expensive",
        #which also makes an empty inventory safe (the loop never runs)
        lower_bound = 0
        upper_bound = len(self.rows_by_price)

        while lower_bound < upper_bound:                    #O(log N) <--- range is cut in half each iteration
            guess = (upper_bound + lower_bound)//2
            if self.rows_by_price[guess][-1] > target_price:
                #guess is more expensive: the answer is guess or to its left
                upper_bound = guess
            else:
                #guess is affordable: the answer is strictly to its right
                lower_bound = guess + 1

        if lower_bound == len(self.rows_by_price):
            return -1
        return lower_bound


import csv 
with open('laptops.csv', encoding = 'utf8') as file:
    data = list(csv.reader(file))           #whole file as a list of lists

header, rows = data[0], data[1:]            #column names, then the data rows


import pprint 
pp = pprint.PrettyPrinter(indent=4)
pp.pprint(header)                           #column names
pp.pprint(rows[:5])                         #first five data rows

[   'Id',
    'Company',
    'Product',
    'TypeName',
    'Inches',
    'ScreenResolution',
    'Cpu',
    'Ram',
    'Memory',
    'Gpu',
    'OpSys',
    'Weight',
    'Price']
[   [   '6571244',
        'Apple',
        'MacBook Pro',
        'Ultrabook',
        '13.3',
        'IPS Panel Retina Display 2560x1600',
        'Intel Core i5 2.3GHz',
        '8GB',
        '128GB SSD',
        'Intel Iris Plus Graphics 640',
        'macOS',
        '1.37kg',
        '1339'],
    [   '7287764',
        'Apple',
        'Macbook Air',
        'Ultrabook',
        '13.3',
        '1440x900',
        'Intel Core i5 1.8GHz',
        '8GB',
        '128GB Flash Storage',
        'Intel HD Graphics 6000',
        'macOS',
        '1.34kg',
        '898'],
    [   '3362737',
        'HP',
        '250 G6',
        'Notebook',
        '15.6',
        'Full HD 1920x1080',
        'Intel Core i5 7200U 2.5GHz',
        '8GB',
        '256GB SSD',
        'Intel HD Graphics 620',
        'No OS',
        '1.86kg',
        '575'],
    [   '9722156',
        'Apple',
        'MacBook Pro',
        'Ultrabook',
        '15.4',
        'IPS Panel Retina Display 2880x1800',
        'Intel Core i7 2.7GHz',
        '16GB',
        '512GB SSD',
        'AMD Radeon Pro 455',
        'macOS',
        '1.83kg',
        '2537'],
    [   '8550527',
        'Apple',
        'MacBook Pro',
        'Ultrabook',
        '13.3',
        'IPS Panel Retina Display 2560x1600',
        'Intel Core i5 3.1GHz',
        '8GB',
        '256GB SSD',
        'Intel Iris Plus Graphics 650',
        'macOS',
        '1.37kg',
        '1803']]


class Inventory():
    #____________________________________________
    #initializes attributes self.header (first CSV row)
    #and self.rows (remaining rows, price column as int)
    def __init__(self,csv_filename):
        #load the whole file into memory
        with open(csv_filename, encoding = 'utf8') as csv_file:
            table = list(csv.reader(csv_file))

        self.header = table[0]
        records = table[1:]
        #prices are read as strings (last column); convert them in place
        for record in records:
            record[-1] = int(record[-1])
        self.rows = records


laptops = Inventory('laptops.csv')


#show the column names, then how many laptops were loaded
print(laptops.header, len(laptops.rows), sep = '\n')

['Id', 'Company', 'Product', 'TypeName', 'Inches', 'ScreenResolution', 'Cpu', 'Ram', 'Memory', 'Gpu', 'OpSys', 'Weight', 'Price']
1303


class Inventory():
    #____________________________________________
    #initializes attributes self.header (first CSV row)
    #and self.rows (remaining rows, price column as int)
    def __init__(self,csv_filename):
        #load the whole file into memory
        with open(csv_filename, encoding = 'utf8') as csv_file:
            table = list(csv.reader(csv_file))

        self.header = table[0]
        self.rows = table[1:]

        #prices are read as strings (last column); convert them in place
        for record in self.rows:                                #O(N)
            record[-1] = int(record[-1])                        #O(1)

    #______________________________________
    #______________________________________
    #linear scan: returns the first row whose first
    #column equals laptop_id, or None if there is none
    def get_laptop_from_id(self, laptop_id):
        matches = (record for record in self.rows if record[0] == laptop_id)    #O(N)
        return next(matches, None)


laptops = Inventory('laptops.csv')
#look up two ids with the linear scan, one result per line
print(laptops.get_laptop_from_id('3362737'),
      laptops.get_laptop_from_id('3362736'),
      sep = '\n')

['3362737', 'HP', '250 G6', 'Notebook', '15.6', 'Full HD 1920x1080', 'Intel Core i5 7200U 2.5GHz', '8GB', '256GB SSD', 'Intel HD Graphics 620', 'No OS', '1.86kg', 575]
None


class Inventory():
    #____________________________________________
    #initializes attributes: 
    # self.header     first CSV row
    # self.rows       remaining rows, price column as int
    # self.id_to_row  dictionary: laptop id (first column) -> row
    def __init__(self,csv_filename):
        #load the whole file into memory
        with open(csv_filename, encoding = 'utf8') as csv_file:
            table = list(csv.reader(csv_file))

        self.header = table[0]
        self.rows = table[1:]

        #prices are read as strings (last column); convert them in place
        for record in self.rows:                            #O(N)
            record[-1] = int(record[-1])                        #O(1)

        #index every row by its id; a repeated id keeps the last row seen
        self.id_to_row = {record[0]: record for record in self.rows}    #O(N)

    #______________________________________
    #______________________________________
    #linear scan: returns the first row whose first
    #column equals laptop_id, or None if there is none
    def get_laptop_from_id(self, laptop_id):
        matches = (record for record in self.rows if record[0] == laptop_id)    #O(N)
        return next(matches, None)

    #______________________________________
    #______________________________________
    #dictionary lookup: returns the row stored under
    #laptop_id in self.id_to_row, or None if absent
    def get_laptop_from_id_fast(self, laptop_id):
        return self.id_to_row.get(laptop_id)                #O(1) lookup time, since dictionary uses hash table


laptops = Inventory('laptops.csv')

#look up two ids through the dictionary, one result per line
print(laptops.get_laptop_from_id_fast('3362737'),
      '',
      laptops.get_laptop_from_id_fast('3362736'),
      sep = '\n')

['3362737', 'HP', '250 G6', 'Notebook', '15.6', 'Full HD 1920x1080', 'Intel Core i5 7200U 2.5GHz', '8GB', '256GB SSD', 'Intel HD Graphics 620', 'No OS', '1.86kg', 575]
None


import time,random

N = 1303                    #number of rows in our dataset
stepsize = 5                #time resolution 
num_trials = 50             #randomness resolution

time_complexity_no_dict = []        #empty lists for plotting data
time_complexity_dict = []
data_size = []

#read the file once; every iteration below works on a prefix of these rows
laptops = Inventory('laptops.csv')
all_rows = laptops.rows

while N > 0:                        
    ids = [str(random.randint(1000000,9999999)) for _ in range(num_trials)]
    laptops.rows = all_rows[0:N]            #make laptop.rows a length of N
    #rebuild the dictionary from the truncated rows so that both lookup
    #methods are timed against the same N laptops
    laptops.id_to_row = {row[0]: row for row in laptops.rows}

    total_time_no_dict = 0                  
    for laptop_id in ids:
        #perf_counter is the clock meant for measuring short durations
        start = time.perf_counter()
        laptops.get_laptop_from_id(laptop_id)
        end = time.perf_counter()
        total_time_no_dict += (end - start)     #total time to call get_laptop_from_id() (num_trials) times

    mean_time_no_dict = total_time_no_dict/num_trials
    time_complexity_no_dict.append(mean_time_no_dict)   #append means to dataset
    
    total_time_dict = 0
    for laptop_id in ids:
        start = time.perf_counter()
        laptops.get_laptop_from_id_fast(laptop_id)
        end = time.perf_counter()
        total_time_dict += (end - start)           #total time to call get_laptop_from_id_fast() (num_trials) times

    mean_time_dict = total_time_dict/num_trials
    time_complexity_dict.append(mean_time_dict)

    data_size.append(N)
    N = N - stepsize        #reduce N


import matplotlib.pyplot as plt
plt.style.use('fivethirtyeight')
#___________________________________________________________
#Initial Plot
#each line gets a label so that ax.legend() below has entries to show
#(without labels it only emits a "No artists with labels found" warning)
fig,ax = plt.subplots(figsize = (12,8))
ax.plot(data_size,time_complexity_no_dict, linewidth = 2, alpha = .8, color = 'dodgerblue',
        label = 'looping through all rows')
ax.plot(data_size,time_complexity_dict, linewidth = 2, color = 'darkviolet',
        label = 'dictionary lookup')
#____________________________________________________________
#Format grid, ticks, etc
ax.legend()
ax.set_xticks([0,400,800,1200])
ax.set_xticklabels(['0','400','800','1200 laptops'])
ax.set_yticks([0,.000020,.000040,.000060])
ax.set_xlim(right = 1350)
ax.set_yticklabels([])
ax.set_ylim(top = .000075)
ax.tick_params(colors = 'grey', which = 'both')
#___________________________________________________________
#create title,subtitle,signature bar
ax.text(-75,.000085, 'Storing Dictionary Results in Fast ID Lookups', weight = 'bold', size = 26, alpha = .75)
ax.text(-75,.000081, 'Time complexity comparison for ID lookups by looping through all', size = 19, alpha = .85)
#the gaps inside the parentheses are filled by the coloured words drawn below
ax.text(-75,.000078, 'rows (       ) and dictionary lookup (          ) ', size = 19, alpha = .85)
ax.text(x = -100, y = -.00002,
    s = '   J. Wilson Peoples                                                                                                                Source: Kaggle Laptop Prices Dataset ',
    fontsize = 12, color = '#f0f0f0', backgroundcolor = 'grey')
#_____________________________________________________________
#on figure annotations
ax.text(x = 35, y = .000078, s ='blue', color = 'dodgerblue', size = 19)
ax.text(x = 549, y = .000078, s ='purple', color = 'darkviolet', size = 19)

ax.annotate("", xy=(500, .00002), xytext=(220,.000035),
            arrowprops=dict(width = 1.5, color = 'grey',alpha = .5))

ax.text(x = -75, y = .000035, s ='complexity O(N)', color = 'grey', size = 19)
ax.text(x = 135, y = .000035, s ='O(N)', color = 'dodgerblue', size = 19)

No artists with labels found to put in legend.  Note that artists whose label start with an underscore are ignored when legend() is called with no argument.

Text(135, 3.5e-05, 'O(N)')


class Inventory():
    #____________________________________________
    #initializes attributes: 
    # self.header     first CSV row
    # self.rows       remaining rows, price column as int
    # self.id_to_row  dictionary: laptop id (first column) -> row
    def __init__(self,csv_filename):
        #load the whole file into memory
        with open(csv_filename, encoding = 'utf8') as csv_file:
            table = list(csv.reader(csv_file))

        self.header = table[0]
        self.rows = table[1:]

        #prices are read as strings (last column); convert them in place
        for record in self.rows:                            #O(N)
            record[-1] = int(record[-1])                        #O(1)

        #index every row by its id; a repeated id keeps the last row seen
        self.id_to_row = {record[0]: record for record in self.rows}    #O(N)

    #______________________________________
    #______________________________________
    #linear scan: returns the first row whose first
    #column equals laptop_id, or None if there is none
    def get_laptop_from_id(self, laptop_id):
        matches = (record for record in self.rows if record[0] == laptop_id)    #O(N)
        return next(matches, None)

    #______________________________________
    #______________________________________
    #dictionary lookup: returns the row stored under
    #laptop_id in self.id_to_row, or None if absent
    def get_laptop_from_id_fast(self, laptop_id):
        return self.id_to_row.get(laptop_id)                #O(1) lookup time, since dictionary uses hash table

    #______________________________________
    #______________________________________
    #brute-force promotion check
    #True: some laptop costs exactly (dollars), or some pair of
    # rows (a row may pair with itself) has prices adding to (dollars)
    #False: otherwise
    def check_promotion_dollars(self, dollars):
        #single laptop                                      #O(N)
        if any(record[-1] == dollars for record in self.rows):
            return True
        #every ordered pair of rows                         #O(N^2)
        return any(first[-1] + second[-1] == dollars
                   for first in self.rows
                   for second in self.rows)


laptops = Inventory('laptops.csv')
#brute-force promotion check for two amounts, one result per line
print(laptops.check_promotion_dollars(1000),
      laptops.check_promotion_dollars(442),
      sep = '\n')

True
False


class Inventory():
    #____________________________________________
    #initializes attributes: 
    # self.header     first CSV row
    # self.rows       remaining rows, price column as int
    # self.id_to_row  dictionary: laptop id (first column) -> row
    # self.prices     set of all prices
    def __init__(self,csv_filename):
        #load the whole file into memory
        with open(csv_filename, encoding = 'utf8') as csv_file:
            table = list(csv.reader(csv_file))

        self.header = table[0]
        self.rows = table[1:]

        #prices are read as strings (last column); convert them in place
        for record in self.rows:                            #O(N)
            record[-1] = int(record[-1])                        #O(1)

        #index every row by its id; a repeated id keeps the last row seen
        self.id_to_row = {record[0]: record for record in self.rows}    #O(N)

        #collect the distinct prices for constant-time membership tests
        self.prices = {record[-1] for record in self.rows}              #O(N)

    #______________________________________
    #______________________________________
    #linear scan: returns the first row whose first
    #column equals laptop_id, or None if there is none
    def get_laptop_from_id(self, laptop_id):
        matches = (record for record in self.rows if record[0] == laptop_id)    #O(N)
        return next(matches, None)

    #______________________________________
    #______________________________________
    #dictionary lookup: returns the row stored under
    #laptop_id in self.id_to_row, or None if absent
    def get_laptop_from_id_fast(self, laptop_id):
        return self.id_to_row.get(laptop_id)                #O(1) lookup time, since dictionary uses hash table

    #______________________________________
    #______________________________________
    #brute-force promotion check
    #True: some laptop costs exactly (dollars), or some pair of
    # rows (a row may pair with itself) has prices adding to (dollars)
    #False: otherwise
    def check_promotion_dollars(self, dollars):
        #single laptop                                      #O(N)
        if any(record[-1] == dollars for record in self.rows):
            return True
        #every ordered pair of rows                         #O(N^2)
        return any(first[-1] + second[-1] == dollars
                   for first in self.rows
                   for second in self.rows)

    #______________________________________
    #______________________________________
    #same question as check_promotion_dollars, answered
    #with membership tests on the set self.prices
    def check_promotion_dollars_fast(self, dollars):
        known_prices = self.prices
        if dollars in known_prices:                         #O(1)
            return True
        #for each row, is the complementary price in the set?    #O(N)
        return any((dollars - record[-1]) in known_prices for record in self.rows)


laptops = Inventory('laptops.csv')
#set-based promotion check for two amounts, one result per line
print(laptops.check_promotion_dollars_fast(1000),
      laptops.check_promotion_dollars_fast(442),
      sep = '\n')

True
False


import time,random

N = 1303                    #number of rows in our dataset
stepsize = 10              #time resolution 
num_trials = 100            #randomness resolution

time_complexity_no_set = []        #empty lists for plotting data
time_complexity_set = []
data_size = []

#read the file once; every iteration below works on a prefix of these rows
laptops = Inventory('laptops.csv')
all_rows = laptops.rows

while N > 0:                        
    dollars_list = [random.randint(100,5000) for _ in range(num_trials)]
    laptops.rows = all_rows[0:N]            #make laptop.rows a length of N
    #rebuild the price set from the truncated rows; otherwise the fast
    #method would test against prices of laptops that are no longer in
    #laptops.rows and the two methods would answer different questions
    laptops.prices = {row[-1] for row in laptops.rows}

    total_time_no_set = 0                  
    for dollars in dollars_list:
        #perf_counter is the clock meant for measuring short durations
        start = time.perf_counter()
        laptops.check_promotion_dollars(dollars)
        end = time.perf_counter()
        total_time_no_set += (end - start)     #total time to call check_promotion_dollars() (num_trials) times

    mean_time_no_set = total_time_no_set/num_trials
    time_complexity_no_set.append(mean_time_no_set)   #append means to dataset
    
    total_time_set = 0
    for dollars in dollars_list:
        start = time.perf_counter()
        laptops.check_promotion_dollars_fast(dollars)
        end = time.perf_counter()
        total_time_set += (end - start)           #total time to call check_promotion_dollars_fast() (num_trials) times

    mean_time_set = total_time_set/num_trials
    time_complexity_set.append(mean_time_set)

    data_size.append(N)
    N = N - stepsize        #reduce N


import matplotlib.pyplot as plt
#___________________________________________________________
#Initial Plot
#each line gets a label so that ax.legend() below has entries to show
#(without labels it only emits a "No artists with labels found" warning)
fig,ax = plt.subplots(figsize = (12,8))
ax.plot(data_size,time_complexity_no_set, linewidth = 2, alpha = .8, color = 'orangered',
        label = 'brute force')
ax.plot(data_size,time_complexity_set, linewidth = 2, color = 'mediumseagreen',
        label = 'pre-saved set of prices')
#____________________________________________________________
#Format grid, ticks, etc
ax.legend()
ax.set_xticks([0,400,800,1200])
ax.set_xticklabels(['0','400','800','1200 laptops'])
ax.set_yticks([0,.0025,.005,.0075,.010])
ax.set_xlim(right = 1350)
ax.set_yticklabels([])
ax.set_ylim(top = .008)
ax.tick_params(colors = 'grey', which = 'both')
#___________________________________________________________
#create title,subtitle,signature bar
ax.text(-75,.0100, 'Storing A Set of Unique Prices Improves Performance ', weight = 'bold', size = 26, alpha = .75)
ax.text(-75,.0095, 'Time complexity comparison for valid promotion checking', size = 19, alpha = .85)
ax.text(-75,.00915, 'using brute force (orange) vs. pre-saving a set of prices (green) ', size = 19, alpha = .85)
ax.text(x = -100, y = -.002,
    s = '   J. Wilson Peoples                                                                                                                       Source: Kaggle Laptop Prices Dataset ',
    fontsize = 12, color = '#f0f0f0', backgroundcolor = 'grey')
#_____________________________________________________________
#on figure annotations
#redraw the colour words of the subtitle in the matching line colours
ax.text(x = 255, y = .00915, s ='orange', color = 'orangered', size = 19)
ax.text(x = 945, y = .00915, s ='green', color = 'mediumseagreen', size = 19)

No artists with labels found to put in legend.  Note that artists whose label start with an underscore are ignored when legend() is called with no argument.

Text(945, 0.00915, 'green')


class Inventory():
    #____________________________________________
    #initializes attributes: 
    # self.header         first CSV row
    # self.rows           remaining rows, price column as int
    # self.id_to_row      dictionary: laptop id (first column) -> row
    # self.prices         set of all prices
    # self.rows_by_price  the rows sorted by ascending price
    def __init__(self,csv_filename):
        #load the whole file into memory
        with open(csv_filename, encoding = 'utf8') as csv_file:
            table = list(csv.reader(csv_file))

        self.header = table[0]
        self.rows = table[1:]

        #prices are read as strings (last column); convert them in place
        for record in self.rows:                            #O(N)
            record[-1] = int(record[-1])                        #O(1)

        #index every row by its id; a repeated id keeps the last row seen
        self.id_to_row = {record[0]: record for record in self.rows}    #O(N)

        #collect the distinct prices for constant-time membership tests
        self.prices = {record[-1] for record in self.rows}              #O(N)

        #price-ordered copy of the row list; self.rows keeps file order
        self.rows_by_price = sorted(self.rows, key = lambda record: record[-1])    #O(N log N)

    #______________________________________
    #______________________________________
    #linear scan: returns the first row whose first
    #column equals laptop_id, or None if there is none
    def get_laptop_from_id(self, laptop_id):
        matches = (record for record in self.rows if record[0] == laptop_id)    #O(N)
        return next(matches, None)

    #______________________________________
    #______________________________________
    #dictionary lookup: returns the row stored under
    #laptop_id in self.id_to_row, or None if absent
    def get_laptop_from_id_fast(self, laptop_id):
        return self.id_to_row.get(laptop_id)                #O(1) lookup time, since dictionary uses hash table

    #______________________________________
    #______________________________________
    #brute-force promotion check
    #True: some laptop costs exactly (dollars), or some pair of
    # rows (a row may pair with itself) has prices adding to (dollars)
    #False: otherwise
    def check_promotion_dollars(self, dollars):
        #single laptop                                      #O(N)
        if any(record[-1] == dollars for record in self.rows):
            return True
        #every ordered pair of rows                         #O(N^2)
        return any(first[-1] + second[-1] == dollars
                   for first in self.rows
                   for second in self.rows)

    #______________________________________
    #______________________________________
    #same question as check_promotion_dollars, answered
    #with membership tests on the set self.prices
    def check_promotion_dollars_fast(self, dollars):
        known_prices = self.prices
        if dollars in known_prices:                         #O(1)
            return True
        #for each row, is the complementary price in the set?    #O(N)
        return any((dollars - record[-1]) in known_prices for record in self.rows)


laptops = Inventory('laptops.csv')
#prices of the first five rows in price order, one per line
for i in range(5):
    cheapest_row = laptops.rows_by_price[i]
    print(cheapest_row[-1])

174
191
196
199
199


class Inventory():
    #____________________________________________
    #initializes attributes: 
    # self.header         first CSV row
    # self.rows           remaining rows, price column (last) as int
    # self.id_to_row      dictionary: laptop id (first column) -> row
    # self.prices         set of all prices
    # self.rows_by_price  the rows sorted by ascending price
    def __init__(self,csv_filename):
        #read file
        with open(csv_filename, encoding = 'utf8') as file:
            data = list(csv.reader(file))
        #_____________
        #assign self.header
        header = data[0]
        self.header = header
        #___________
        #assign self.rows
        rows = data[1:] 
        self.rows = rows
        #_______________________________
        #convert price column to integer
        for row in rows:                                    #O(N)
            row[-1] = int(row[-1])                              #O(1)    
        #______________________           
        # assign self.id_to_row (a repeated id keeps the last row seen)
        self.id_to_row = {}
        for row in rows:                                    #O(N)
            laptop_id = row[0]                                  #O(1)
            self.id_to_row[laptop_id] = row                     #O(1)
        #__________________________________________
        # assign self.prices, the set of all prices
        self.prices = set()
        for row in rows:                                    #O(N)
            self.prices.add(row[-1])                            #O(1)
        #_________________________________________
        # helper function which takes a row, 
        # and returns its price - used for self.rows_by_price
        def row_price(row):
            return row[-1]
        
        # assign self.rows_by_price, 
        # a sorted version of rows (self.rows keeps the file order)
        self.rows_by_price = sorted(rows, key = row_price)      #O(N log N)
        
        
    #______________________________________
    #______________________________________
    #given laptop_id, loops through rows, 
    #returns row with given laptop_id
    def get_laptop_from_id(self, laptop_id):
        for row in self.rows:                               #O(N)
            if row[0] == laptop_id:                             #O(1)
                return row
        return None            #if no laptop found, return None

    #______________________________________
    #______________________________________
    #given laptop_id, returns corresponding
    #row using dictionary self.id_to_row
    def get_laptop_from_id_fast(self, laptop_id):
        if laptop_id in self.id_to_row:                     #O(1) lookup time, since dictionary uses hash table
            return self.id_to_row[laptop_id]        
        return None
    
    #______________________________________
    #______________________________________
    #given dollars, returns True or False
    #True: if exactly (dollars) can be spent
    # purchasing up to two laptops
    # (a row may be paired with itself)
    #False: otherwise
    def check_promotion_dollars(self, dollars):
        #see if any laptop costs exactly dollars
        for row in self.rows:                               #O(N)         
            if row[-1] == dollars:                              #O(1)
                return True
        #if not, check if two laptops have prices adding to dollars
        for row_1 in self.rows:                             #O(N)
            for row_2 in self.rows:                             #O(N) <---- total of O(N^2)
                if (row_1[-1] + row_2[-1] == dollars):
                    return True
        #if neither case above, return false
        return False
    #______________________________________
    #______________________________________
    #same function as check_promotion_dollars
    #uses the set of all prices self.prices
    def check_promotion_dollars_fast(self, dollars):
        if dollars in self.prices:                          #O(1)
            return True
        for row in self.rows:                               #O(N)
            #is there a price that complements this row's price?
            if (dollars - row[-1]) in self.prices:              #O(1)
                return True  
        return False
    
    #_________________________________
    # uses self.rows_by_price to find first laptop outside
    # budget range in O(log N) time using a binary search
    # returns the index (into self.rows_by_price) of the first row whose
    # price is strictly greater than target_price, or -1 when there is
    # no such row (every laptop is affordable, or the inventory is empty)
    def find_first_laptop_more_expensive(self, target_price):
        #search the half-open index range [lower_bound, upper_bound);
        #upper_bound == len(...) stands for "no laptop is more expensive",
        #which also makes an empty inventory safe (the loop never runs)
        lower_bound = 0
        upper_bound = len(self.rows_by_price)

        while lower_bound < upper_bound:                    #O(log N) <--- range is cut in half each iteration
            guess = (upper_bound + lower_bound)//2
            if self.rows_by_price[guess][-1] > target_price:
                #guess is more expensive: the answer is guess or to its left
                upper_bound = guess
            else:
                #guess is affordable: the answer is strictly to its right
                lower_bound = guess + 1

        if lower_bound == len(self.rows_by_price):
            return -1
        return lower_bound


laptops = Inventory('laptops.csv')

#binary-search result for two budgets, one per line
print(laptops.find_first_laptop_more_expensive(1000),
      laptops.find_first_laptop_more_expensive(10000),
      sep = '\n')

683
-1


budget = 1000
#perf_counter is the clock meant for measuring short durations
start = time.perf_counter()
index = laptops.find_first_laptop_more_expensive(budget)
end = time.perf_counter()
#-1 means no laptop costs more than the budget; using it as an index
#would silently show the last (most expensive) row instead
if index == -1:
    print(None)
else:
    print(laptops.rows_by_price[index])
print("query time:{time:.10f}".format(time = end - start))

['8747948', 'Lenovo', 'ThinkPad T460', 'Notebook', '14', '1366x768', 'Intel Core i5 6200U 2.3GHz', '4GB', '508GB Hybrid', 'Intel HD Graphics 520', 'Windows 7', '1.70kg', 1002]
query time:0.0000381470


#rows before index are the laptops within budget; index == -1 means every
#laptop is within budget, so slicing with it would wrongly drop the last row
affordable = laptops.rows_by_price if index == -1 else laptops.rows_by_price[0:index]
affordable[0:5] #just printing the first 5

[['3564228',
  'Acer',
  'C740-C9QX (3205U/2GB/32GB/Chrome',
  'Netbook',
  '11.6',
  '1366x768',
  'Intel Celeron Dual Core 3205U 1.5GHz',
  '2GB',
  '32GB SSD',
  'Intel HD Graphics',
  'Chrome OS',
  '1.3kg',
  174],
 ['7667029',
  'Asus',
  'Vivobook E200HA',
  'Netbook',
  '11.6',
  '1366x768',
  'Intel Atom x5-Z8350 1.44GHz',
  '2GB',
  '32GB Flash Storage',
  'Intel HD Graphics 400',
  'Windows 10',
  '0.98kg',
  191],
 ['1478754',
  'Vero',
  'V131 (X5-Z8350/4GB/32GB/FHD/W10)',
  'Notebook',
  '13.3',
  'Full HD 1920x1080',
  'Intel Atom X5-Z8350 1.44GHz',
  '4GB',
  '32GB Flash Storage',
  'Intel HD Graphics 400',
  'Windows 10',
  '1.35kg',
  196],
 ['4366200',
  'Asus',
  'E402WA-GA010T (E2-6110/2GB/32GB/W10)',
  'Notebook',
  '14',
  '1366x768',
  'AMD E-Series E2-6110 1.5GHz',
  '2GB',
  '32GB Flash Storage',
  'AMD Radeon R2',
  'Windows 10',
  '1.65kg',
  199],
 ['3840240',
  'Acer',
  'Chromebook C910-C2ST',
  'Notebook',
  '15.6',
  '1366x768',
  'Intel Celeron Dual Core 3205U 1.5GHz',
  '2GB',
  '16GB SSD',
  'Intel HD Graphics',
  'Chrome OS',
  '2.19kg',
  199]]


class TimeEfficientInventory():
    """Laptop inventory that precomputes lookup structures for fast queries.

    Attributes set by __init__:
        header: first row of the CSV file.
        rows: remaining rows, with the last column (price) converted to int.
        id_to_row: dict mapping row[0] (the laptop id) to its row.
        prices: set of every price found in the last column.
        rows_by_price: the rows sorted by ascending price.
    """

    #____________________________________________
    def __init__(self, csv_filename):
        """Read csv_filename and build all lookup structures."""
        #read file
        with open(csv_filename, encoding = 'utf8') as file:
            data = list(csv.reader(file))
        self.header = data[0]
        rows = data[1:]
        self.rows = rows
        #convert price column to integer, in place
        for row in rows:                                            #O(N)
            row[-1] = int(row[-1])
        #if an id is repeated, the last row with that id wins
        self.id_to_row = {row[0]: row for row in rows}              #O(N)
        self.prices = {row[-1] for row in rows}                     #O(N)
        self.rows_by_price = sorted(rows, key=lambda row: row[-1])  #O(N log N)

    #______________________________________
    def get_laptop_from_id_fast(self, laptop_id):
        """Return the row whose id is laptop_id, or None if there is none."""
        #single hash-table lookup, O(1) on average
        return self.id_to_row.get(laptop_id)

    #______________________________________
    def check_promotion_dollars_fast(self, dollars):
        """Return True if exactly `dollars` can be spent on one or two laptops.

        The two laptops may be the same row, so a price counted twice
        also qualifies.
        """
        if dollars in self.prices:                          #O(1)
            return True
        #for each price, check whether the complementary price exists
        return any(                                         #O(N)
            (dollars - row[-1]) in self.prices
            for row in self.rows
        )

    #_________________________________
    def find_first_laptop_more_expensive(self, target_price):
        """Return the index in rows_by_price of the first laptop costing
        more than target_price, found by binary search in O(log N).

        Returns -1 when no laptop is more expensive than target_price,
        which includes the case of an empty inventory.
        """
        rows = self.rows_by_price
        #half-open range [lower_bound, upper_bound): the answer, if any,
        #always lies inside it, and len(rows) stands for "no such laptop"
        lower_bound = 0
        upper_bound = len(rows)

        while lower_bound < upper_bound:                    #O(log N)
            guess = (lower_bound + upper_bound) // 2
            if rows[guess][-1] > target_price:
                #guess is a candidate answer, keep it in range
                upper_bound = guess
            else:
                #guess is affordable, answer must be to its right
                lower_bound = guess + 1

        if lower_bound == len(rows):
            return -1
        return lower_bound


class MemoryEfficientInventory():
    """Laptop inventory that stores only the raw CSV rows.

    No auxiliary lookup structures are built, so every query scans
    self.rows. Prices stay as the strings read from the file and are
    converted with int() at comparison time.

    Attributes set by __init__:
        header: first row of the CSV file.
        rows: all remaining rows, unmodified.
    """

    def __init__(self,csv_filename):
        """Load the CSV file, splitting it into header and rows."""
        with open(csv_filename, encoding = 'utf8') as csv_file:
            table = list(csv.reader(csv_file))
        self.header = table[0]
        self.rows = table[1:]

    def get_laptop_from_id(self, laptop_id):
        """Scan the rows in order and return the first one whose id
        (column 0) equals laptop_id; return None when nothing matches."""
        matching = (entry for entry in self.rows if entry[0] == laptop_id)   #O(N)
        return next(matching, None)

    def check_promotion_dollars(self, dollars):
        """Return True when exactly `dollars` can be spent buying up to
        two laptops (the same row may be used twice), False otherwise."""
        # one laptop costing exactly `dollars`?                      O(N)
        if any(int(entry[-1]) == dollars for entry in self.rows):
            return True
        # otherwise try every ordered pair of rows                   O(N^2)
        return any(
            int(first[-1]) + int(second[-1]) == dollars
            for first in self.rows
            for second in self.rows
        )

Column name	Description
ID	A unique identifier for the laptop.
Company	The name of the company that produces the laptop.
Product	The name of the laptop.
TypeName	The type of laptop.
Inches	The size of the screen in inches.
ScreenResolution	The resolution of the screen.
CPU	The laptop CPU.
RAM	The amount of RAM in the laptop.
Memory	The size of the hard drive.
GPU	The graphics card name.
OpSys	The name of the operating system.
Weight	The laptop weight.
Price	The price of the laptop.

Building Fast Queries on a CSV¶

Summary¶

About the Data¶

Reading in the Dataset¶

Building an Inventory Class¶

Two ID Search Methods: Time and Space Complexity Analysis¶

Maximizing Promotion Dollars Spent¶

Finding Laptops Within Budget¶

Space/Time Complexity Tradeoffs¶

Conclusion¶